installing the packages

# Install only the packages that are not already available, so re-running the
# script does not reinstall everything each time. readr is included because it
# is loaded below with library(readr).
required_packages <- c(
  "outliers", "scatterplot3d", "dplyr", "ggplot2", "colorspace", "readr"
)
missing_packages <- setdiff(required_packages, rownames(installed.packages()))
if (length(missing_packages) > 0) {
  install.packages(missing_packages)
}

Loading the libraries and reading the dataset

library(ggplot2)
library(outliers)
library(scatterplot3d)
library(dplyr)
library(readr)
# Read the salary data from the working directory; read_csv() guesses the
# column types and reports them on load.
dataset <- read_csv(file = "salary.csv")
Rows: 32561 Columns: 15── Column specification ─────────────────────────────────────────────────────────────────────────────
Delimiter: ","
chr (9): workclass, education, marital-status, occupation, relationship, race, sex, native-countr...
dbl (6): age, fnlwgt, education-num, capital-gain, capital-loss, hours-per-week
ℹ Use `spec()` to retrieve the full column specification for this data.
ℹ Specify the column types or set `show_col_types = FALSE` to quiet this message.
# Inspect the freshly loaded data in the interactive viewer.
View(dataset)

Sample of raw dataset and summary

# Open the raw data in the interactive viewer, then print per-column summary
# statistics.
View(dataset)
summary(dataset)
      age         workclass             fnlwgt         education         education-num  
 Min.   :17.00   Length:32561       Min.   :  12285   Length:32561       Min.   : 1.00  
 1st Qu.:28.00   Class :character   1st Qu.: 117827   Class :character   1st Qu.: 9.00  
 Median :37.00   Mode  :character   Median : 178356   Mode  :character   Median :10.00  
 Mean   :38.58                      Mean   : 189778                      Mean   :10.08  
 3rd Qu.:48.00                      3rd Qu.: 237051                      3rd Qu.:12.00  
 Max.   :90.00                      Max.   :1484705                      Max.   :16.00  
 marital-status      occupation        relationship           race               sex           
 Length:32561       Length:32561       Length:32561       Length:32561       Length:32561      
 Class :character   Class :character   Class :character   Class :character   Class :character  
 Mode  :character   Mode  :character   Mode  :character   Mode  :character   Mode  :character  
                                                                                               
                                                                                               
                                                                                               
  capital-gain    capital-loss    hours-per-week  native-country        salary         
 Min.   :    0   Min.   :   0.0   Min.   : 1.00   Length:32561       Length:32561      
 1st Qu.:    0   1st Qu.:   0.0   1st Qu.:40.00   Class :character   Class :character  
 Median :    0   Median :   0.0   Median :40.00   Mode  :character   Mode  :character  
 Mean   : 1078   Mean   :  87.3   Mean   :40.44                                        
 3rd Qu.:    0   3rd Qu.:   0.0   3rd Qu.:45.00                                        
 Max.   :99999   Max.   :4356.0   Max.   :99.00                                        

encoding

# Drop every row that contains the "?" placeholder BEFORE encoding. Once a
# column is converted to integer codes the literal "?" is gone (it simply
# becomes one more code), so a text search run after encoding cannot find it.
has_placeholder <- rowSums(dataset == "?", na.rm = TRUE) > 0
dataset <- dataset[!has_placeholder, ]

# Label-encode the categorical columns: factor() collects the distinct values
# as levels and as.integer() keeps each value's level index.
dataset$workclass <- as.integer(factor(dataset$workclass))
# The hyphenated source column is kept; its codes go into a new
# dot-separated column.
dataset$marital.status <- as.integer(factor(dataset$`marital-status`))
dataset$occupation <- as.integer(factor(dataset$occupation))
# Encode relationship from its own values. It was previously derived from
# workclass, which replaced the relationship data with a copy of the
# workclass codes.
dataset$relationship <- as.integer(factor(dataset$relationship))
dataset$race <- as.integer(factor(dataset$race))
dataset$sex <- as.integer(factor(dataset$sex))
# As with marital-status, the original native-country column is left in place.
dataset$native.country <- as.integer(factor(dataset$`native-country`))
print(dataset)

Missing values

# Count NA cells across the whole table. Only real NA values are counted;
# placeholder strings such as "?" are not NA and are therefore not included.
sum(is.na(dataset))
[1] 0

We noticed that some values contain a question mark ("?"), even though the missing-value check in the previous part returned 0. These are placeholders for unknown values, so we clean them by deleting every row that contains one.

# Remove every row in which at least one cell equals the "?" placeholder.
# rowSums(..., na.rm = TRUE) treats NA cells as "not a placeholder"; without
# that, a row containing NA would yield an NA index and come back as an
# all-NA row instead of being kept.
# NOTE(review): columns that were integer-encoded earlier can no longer
# contain the literal "?", so this only catches placeholders in columns that
# are still character at this point.
has_placeholder <- rowSums(dataset == "?", na.rm = TRUE) > 0
dataset <- dataset[!has_placeholder, ]
print(dataset)

removing outliers

# Flag the age value lying furthest from the sample mean; TRUE marks every row
# holding that value.
OutAge <- outlier(x = dataset[["age"]], logical = TRUE)
# Number of rows flagged.
sum(OutAge)
[1] 42
# Row positions of the flagged ages (which() already returns the TRUE indices
# of a logical vector).
Find_outlier <- which(OutAge)
# Print the full logical flag vector.
OutAge
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [16] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [31] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [46] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [61] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [76] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [91] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [106] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [121] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [136] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [151] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [166] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [181] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [196] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [226] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [241] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [256] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [271] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [286] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [301] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [316] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [331] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [346] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [361] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [376] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [391] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [406] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [436] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [451] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [466] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [481] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [496] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [511] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [526] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [541] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [556] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [571] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [586] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [601] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [616] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [646] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [661] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [676] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [691] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [706] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [721] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [736] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [751] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [766] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [781] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [796] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [811] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [826] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [856] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [871] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [886] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [901] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [916] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [931] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [946] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [961] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [976] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [991] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 30978 entries ]
# Show the row positions currently stored in Find_outlier.
Find_outlier
 [1]   218  1021  1898  2261  2836  3993  4032  5007  5171  5267  5301  6112  6497  8646  8800  8810
[17] 10026 10355 11307 11522 11785 12231 12743 13905 15082 15606 18087 18392 18499 18872 19141 19393
[33] 20243 21828 23614 23808 24852 27958 30473 31129 31702 31791
####
# Flag the fnlwgt value lying furthest from the sample mean; TRUE marks every
# row holding that value.
Outfnlwgt <- outlier(x = dataset[["fnlwgt"]], logical = TRUE)
# Number of rows flagged.
sum(Outfnlwgt)
[1] 1
# Row positions of the flagged fnlwgt values; this overwrites the previous
# contents of Find_outlier.
Find_outlier <- which(Outfnlwgt)
# Print the full logical flag vector.
Outfnlwgt
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [16] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [31] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [46] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [61] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [76] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [91] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [106] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [121] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [136] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [151] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [166] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [181] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [196] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [226] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [241] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [256] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [271] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [286] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [301] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [316] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [331] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [346] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [361] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [376] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [391] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [406] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [436] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [451] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [466] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [481] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [496] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [511] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [526] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [541] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [556] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [571] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [586] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [601] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [616] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [646] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [661] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [676] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [691] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [706] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [721] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [736] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [751] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [766] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [781] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [796] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [811] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [826] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [856] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [871] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [886] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [901] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [916] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [931] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [946] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [961] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [976] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [991] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 30978 entries ]
###
# Flag the education-num value lying furthest from the sample mean; TRUE marks
# every row holding that value.
Outeducation <- outlier(x = dataset[["education-num"]], logical = TRUE)
# Number of rows flagged.
sum(Outeducation)
[1] 50
# Row positions of the flagged education-num values; this overwrites the
# previous contents of Find_outlier.
Find_outlier <- which(Outeducation)
# Print the full logical flag vector.
Outeducation
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [16] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [31] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [46] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [61] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [76] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [91] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [106] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [121] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [136] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [151] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [166] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [181] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [196] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE  TRUE FALSE FALSE FALSE FALSE FALSE
 [226] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [241] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [256] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [271] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [286] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [301] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [316] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [331] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [346] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [361] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [376] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [391] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [406] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [436] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [451] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [466] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [481] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [496] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [511] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [526] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [541] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [556] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [571] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [586] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [601] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [616] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [646] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [661] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [676] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [691] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [706] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [721] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [736] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [751] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [766] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [781] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [796] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [811] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [826] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [856] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [871] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [886] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [901] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [916]  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [931] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [946] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [961] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [976] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [991] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 30978 entries ]
##

# Flag the hours-per-week value lying furthest from the sample mean; TRUE marks
# every row holding that value.
Outhours <- outlier(x = dataset[["hours-per-week"]], logical = TRUE)
# Number of rows flagged.
sum(Outhours)
[1] 83
# Row positions of the flagged hours-per-week values; this overwrites the
# previous contents of Find_outlier.
Find_outlier <- which(Outhours)
# Print the full logical flag vector.
Outhours
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [16] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [31] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [46] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [61] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [76] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [91] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [106] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [121] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [136] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [151] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [166] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [181] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [196] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [226] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [241] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [256] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [271] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [286] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [301] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [316] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [331] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [346] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [361] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [376] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [391] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [406] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [436] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [451] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [466] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [481] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [496] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [511] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [526] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [541] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [556] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [571] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [586] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [601] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [616] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [646] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [661] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [676] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [691] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [706] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [721] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [736] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [751] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [766] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [781] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [796] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [811] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [826] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [856] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [871] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [886] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [901] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [916] FALSE FALSE FALSE  TRUE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [931] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [946] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [961] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [976] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [991] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 30978 entries ]
###
# Flag the capital-gain value lying furthest from the sample mean; TRUE marks
# every row holding that value.
OutcapitalG <- outlier(x = dataset[["capital-gain"]], logical = TRUE)
# Number of rows flagged.
sum(OutcapitalG)
[1] 152
# Row positions of the flagged capital-gain values; this overwrites the
# previous contents of Find_outlier.
Find_outlier <- which(OutcapitalG)
# Print the full logical flag vector.
OutcapitalG
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [16] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [31] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [46] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [61] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [76] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [91] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [106] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [121] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [136] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [151] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [166] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [181] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [196] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [226] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [241] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [256] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [271] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [286] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [301] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [316] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [331] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [346] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [361] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [376] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [391] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [406] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [436] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [451] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [466] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [481] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [496] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [511] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [526] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [541] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [556] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [571] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [586] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [601] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [616] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [646] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [661] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [676] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [691] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [706] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [721] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [736] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [751] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [766] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [781] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [796] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [811] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [826] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [856] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [871] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [886] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [901] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [916] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [931] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [946] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [961] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [976] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [991] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 30978 entries ]
###
# Logical flags returned by outlier() for `capital-loss`, followed by the
# number of rows that were flagged.
OutcapitalL <- outlier(dataset[["capital-loss"]], logical = TRUE)
sum(OutcapitalL)
[1] 3
# Row positions of the flagged `capital-loss` values, then echo the flags.
Find_outlier <- which(OutcapitalL)
print(OutcapitalL)
   [1] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [16] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [31] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [46] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [61] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [76] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
  [91] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [106] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [121] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [136] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [151] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [166] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [181] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [196] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [211] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [226] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [241] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [256] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [271] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [286] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [301] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [316] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [331] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [346] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [361] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [376] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [391] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [406] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [421] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [436] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [451] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [466] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [481] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [496] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [511] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [526] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [541] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [556] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [571] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [586] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [601] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [616] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [631] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [646] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [661] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [676] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [691] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [706] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [721] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [736] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [751] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [766] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [781] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [796] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [811] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [826] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [841] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [856] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [871] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [886] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [901] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [916] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [931] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [946] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [961] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [976] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [991] FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE FALSE
 [ reached getOption("max.print") -- omitted 30978 entries ]
# Remove outlier rows.
# NOTE(review): Find_outlier is reassigned after each outlier() call above, so
# at this point it only holds the rows flagged for `capital-loss`; rows flagged
# for earlier attributes (e.g. `capital-gain`) are NOT removed. Confirm whether
# that is intended.
# The length check matters: indexing with -integer(0) selects zero rows, which
# would silently empty the dataset if nothing had been flagged.
if (length(Find_outlier) > 0) {
  dataset <- dataset[-Find_outlier, ]
}

printing the dataset after cleaning the data

# Show the data as it stands right after the outlier-row removal step.
print(dataset)

Create a new column called num_salary that encodes the binary salary attribute numerically (1 for ">50K", 0 otherwise), which makes it easier to use since it is the class label

# Numeric class label: 1 where salary is exactly ">50K", 0 for any other value.
dataset$num_salary <- as.numeric(dataset$salary == ">50K")

Data summary

# Per-attribute summaries. Numeric columns report quantiles and the mean;
# character columns only report length, class and mode.
summary(dataset$age)
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  17.00   28.00   37.00   38.58   48.00   90.00 
summary(dataset$`hours-per-week`)
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
   1.00   40.00   40.00   40.42   45.00   99.00 
summary(dataset$education)
   Length     Class      Mode 
    31975 character character 
# occupation and sex are summarised as numbers below, i.e. they no longer hold
# their original text labels at this point.
summary(dataset$occupation)
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  1.000   4.000   8.000   7.565  11.000  15.000 
summary(dataset$sex)
   Min. 1st Qu.  Median    Mean 3rd Qu.    Max. 
  1.000   1.000   2.000   1.668   2.000   2.000 
summary(dataset$salary)
   Length     Class      Mode 
    31975 character character 

variance

# Variance of age and of hours-per-week, computed with var().
var(dataset$age)
[1] 172.4622
var(dataset$`hours-per-week`)
[1] 143.5073

Discretize the hours-per-week into three bins

# Bin hours-per-week into three labelled groups using the break points
# 0, 30, 40 and Inf (cut() closes intervals on the right by default, so a
# value of exactly 30 is "Low" and exactly 40 is "Medium").
dataset$hours_per_week_binned <- cut(
  dataset[["hours-per-week"]],
  breaks = c(0, 30, 40, Inf),
  labels = c("Low", "Medium", "High")
)
print(dataset$hours_per_week_binned)
   [1] Medium Low    Medium Medium Medium Medium Low    High   High   Medium High   Medium Low   
  [14] High   High   Medium Medium High   High   High   Low    Medium Medium Medium Medium Medium
  [27] High   High   Medium High   High   Medium Medium Low    Medium Medium Low    Medium High  
  [40] Medium High   Medium Medium Medium Medium Medium Medium High   Medium High   High   High  
  [53] Medium Medium Medium High   Medium Medium Medium High   High   Medium Medium Medium High  
  [66] Medium Medium Medium High   Medium Low    Medium Medium Low    Low    Medium Low    Medium
  [79] Medium High   Medium Medium Medium High   Medium High   Medium Medium Low    Medium High  
  [92] High   High   Medium Medium Medium High   High   Medium Medium Medium Medium Medium Medium
 [105] Medium Medium Medium High   Low    Medium High   High   Medium High   High   Medium High  
 [118] Medium High   Medium Medium Low    Medium Medium Medium High   Medium Medium High   Medium
 [131] Medium High   Medium Low    Medium Medium Medium Low    Medium Medium Low    Low    Low   
 [144] Medium Medium Medium Medium Medium Medium High   High   Medium Low    High   High   Low   
 [157] Medium Medium Medium Medium Medium High   Medium Low    Low    Medium Medium Medium High  
 [170] Medium Low    Medium Medium Low    High   Medium Medium High   Medium High   Medium Medium
 [183] High   High   Low    Low    Medium Medium High   Low    Medium Medium High   Medium Medium
 [196] Medium Medium High   Medium Medium Medium Medium High   Medium Low    Medium Medium Medium
 [209] Medium Medium High   Medium High   High   Medium Medium Medium Medium Low    Medium Medium
 [222] Low    High   Low    Medium Medium Medium High   Medium High   Medium Medium High   High  
 [235] Medium Medium Low    High   Low    Medium High   Medium High   Medium Medium Low    Medium
 [248] Low    Medium Medium Low    High   Medium Medium High   Low    Medium Medium High   Low   
 [261] Medium High   Medium Medium Low    High   Medium Medium Medium Medium Medium Medium High  
 [274] Low    Medium High   High   Medium Medium High   High   Medium Medium High   Medium High  
 [287] High   Medium Low    High   Medium High   Medium Low    High   Medium Medium Medium High  
 [300] Medium Medium High   Medium Medium Low    Medium Low    Medium Medium Medium Medium Low   
 [313] Medium High   High   Medium Low    High   Low    High   Medium High   High   Medium Medium
 [326] Medium Medium High   Medium High   Low    Medium Medium Medium Medium Low    Medium High  
 [339] Low    Medium Low    Low    Medium Medium Medium Low    Medium Medium Medium Medium Medium
 [352] Medium Low    Medium High   High   High   Medium High   Low    High   Medium Low    Low   
 [365] Medium Medium Medium Low    Medium Medium Low    High   Medium High   Medium Medium Medium
 [378] Low    Medium Low    Low    Medium Medium High   Medium Medium Medium Medium Medium High  
 [391] High   Medium Medium Medium High   Medium High   Medium Low    Medium High   Low    Medium
 [404] Medium High   Medium High   Medium Low    Medium Medium Low    Low    Medium Medium Medium
 [417] High   Medium High   Medium Medium Low    Medium Medium Low    Medium High   High   Medium
 [430] Medium Medium Medium Low    Medium Medium Medium Medium Medium Medium Medium Low    Medium
 [443] High   Medium Medium Medium Medium High   High   Medium Medium Medium High   Medium Low   
 [456] High   Medium Medium High   Low    Medium Medium Medium High   Low    Medium Low    Low   
 [469] Medium Medium High   Low    Low    Medium Medium Low    Medium High   Medium High   Medium
 [482] Medium High   Low    Low    Medium Medium Medium Medium Low    Medium Medium Medium High  
 [495] Medium Medium Low    Medium Medium Medium High   Low    High   High   High   Medium Low   
 [508] Low    Medium High   High   High   High   High   High   Medium Medium Low    High   Medium
 [521] High   Medium Medium High   High   High   Low    Medium High   Medium Medium Medium Medium
 [534] Medium High   High   Low    Medium Medium Medium High   Medium Medium Medium Medium Medium
 [547] Medium Medium Medium High   Medium High   Medium High   High   High   Medium Medium High  
 [560] Medium Medium Low    Medium High   Medium Low    Medium Medium High   Low    Medium Medium
 [573] Medium Medium Low    High   Medium High   High   Medium Medium High   Medium Medium Medium
 [586] Low    High   Medium High   Medium Low    Medium Medium Medium Medium Medium Medium Medium
 [599] Low    High   Medium High   Medium Low    High   High   Medium High   High   Low    Low   
 [612] Low    High   Medium High   High   High   Medium Low    Medium Medium High   Medium High  
 [625] Low    Medium High   High   High   High   Medium Medium High   High   Medium Medium Low   
 [638] High   Medium Low    High   Medium High   Medium Medium Low    High   Medium Medium Medium
 [651] High   Medium Medium Low    Medium Medium Medium Medium Medium Medium Low    Low    Medium
 [664] High   Medium Low    Medium High   High   High   Medium Medium Medium Low    Medium Low   
 [677] High   Medium Low    Medium High   High   Low    Low    High   High   Medium Medium Low   
 [690] High   Medium Low    Medium High   High   Medium Medium Medium Low    Medium Medium Medium
 [703] Medium Medium Medium Medium Low    High   Medium High   Medium High   High   Medium Low   
 [716] Medium Low    Medium High   Low    Medium Medium Medium High   Low    Medium Low    High  
 [729] High   Medium Low    Medium Medium Medium Medium Medium Medium Low    Medium High   Medium
 [742] Medium Medium High   Medium Medium Low    Medium Medium High   High   High   Medium Low   
 [755] High   Medium Medium Medium High   Low    Medium High   Medium High   Medium High   High  
 [768] High   High   Medium High   Low    Low    Medium High   Medium Medium Medium High   Low   
 [781] Medium Medium Medium Medium Medium Low    Low    Medium Low    High   Medium High   Medium
 [794] Low    Medium Medium High   Medium Low    High   High   High   High   High   Medium High  
 [807] Medium Medium High   High   Medium Low    Low    Medium Low    Medium Medium Medium Low   
 [820] Medium Medium High   High   Low    Low    High   Medium High   Medium Medium High   High  
 [833] Medium Low    Medium High   High   Medium High   Medium Medium Medium Medium High   Low   
 [846] Medium High   High   Medium Low    Medium Low    High   Medium Medium High   Medium Medium
 [859] Low    High   Low    Medium Medium Low    Medium Medium High   High   High   Low    Low   
 [872] Medium High   Low    Medium Medium High   High   Medium High   High   High   Medium High  
 [885] Low    Medium Medium High   Medium High   Low    Low    Medium Low    High   High   Medium
 [898] Medium High   High   Medium Low    Low    Low    Medium Medium Medium Low    Medium Medium
 [911] High   High   Medium High   Low    Medium Medium High   High   Low    Medium Low    Medium
 [924] Medium Medium Medium High   Medium Medium Medium High   Medium Medium Medium High   Medium
 [937] Low    Medium High   Medium Medium Medium High   Medium High   Medium Medium Low    High  
 [950] Low    Medium Low    Medium Medium Medium Medium High   Medium Medium Medium Medium Medium
 [963] High   Medium Medium High   Medium Low    Medium Medium Medium Medium Medium Medium Low   
 [976] High   High   High   High   High   Medium High   Medium High   Medium High   Low    Medium
 [989] Medium Medium High   High   Medium Medium Medium High   Low    Medium Medium Medium
 [ reached getOption("max.print") -- omitted 30975 entries ]
Levels: Low Medium High

Create a density plot for the age variable

# Kernel density curve of age
ggplot(data = dataset, mapping = aes(x = age)) + geom_density()

histograms

# Distribution of age
ggplot(data = dataset, mapping = aes(x = age)) + geom_histogram()

# Distribution of num_salary (1 = salary ">50K", 0 = any other salary value)
ggplot(data = dataset, mapping = aes(x = num_salary)) + geom_histogram()

# Distribution of hours-per-week
ggplot(data = dataset, mapping = aes(x = `hours-per-week`)) + geom_histogram()

# Distribution of fnlwgt
ggplot(data = dataset, mapping = aes(x = fnlwgt)) + geom_histogram()

bar plots

# Row counts per workclass value
ggplot(data = dataset, mapping = aes(x = workclass)) +
  geom_bar()

# Row counts per education value
ggplot(data = dataset, mapping = aes(x = education)) +
  geom_bar()

# Row counts per marital-status value
ggplot(data = dataset, mapping = aes(x = `marital-status`)) +
  geom_bar()

# Row counts per occupation value
ggplot(data = dataset, mapping = aes(x = occupation)) +
  geom_bar()

# Row counts per relationship value
ggplot(data = dataset, mapping = aes(x = relationship)) +
  geom_bar()

# Row counts per sex value
ggplot(data = dataset, mapping = aes(x = sex)) +
  geom_bar()

# Row counts per native-country value
ggplot(data = dataset, mapping = aes(x = `native-country`)) +
  geom_bar()

# Row counts per salary value
ggplot(data = dataset, mapping = aes(x = salary)) +
  geom_bar()

box plot

# Hours per week, one box per salary class
ggplot(data = dataset, mapping = aes(x = salary, y = `hours-per-week`)) +
  geom_boxplot() +
  labs(
    title = "Box Plot of Salary and Hours per Week",
    x = "Salary",
    y = "Hours per Week"
  )

# Age, one box per salary class
ggplot(data = dataset, mapping = aes(x = salary, y = age)) +
  geom_boxplot() +
  labs(
    title = "Box Plot of Age and Salary",
    x = "salary",
    y = "age"
  )

scatter plot

# 3-D scatter: num_salary on x, age on y, hours-per-week on z
scatterplot3d(
  x = dataset$num_salary,
  y = dataset$age,
  z = dataset$`hours-per-week`
)

pie chart for the salary attribute

# Count each salary value, turn the counts into percentages rounded to one
# decimal place, and use "<value>\n<percent>%" as the slice labels.
tab <- dataset$salary %>%
  table()
precentages <- round(prop.table(tab), digits = 3) * 100
txt <- paste0(names(tab), "\n", precentages, "%")
pie(tab, labels = txt)

Normalization

# Keep a copy of the data before any scaling; the normalization calls below
# read their input from this copy and write the result into `dataset`.
dataWithoutNormalization <- dataset
print(dataWithoutNormalization)
# Define function normalize().
# Min-max scaling: maps the smallest value of `x` to 0 and the largest to 1.
#   x      numeric vector.
#   na.rm  if TRUE, NA values are ignored when finding the minimum and maximum
#          (they stay NA in the result). The default FALSE keeps the previous
#          behaviour, where any NA makes the whole result NA.
# Returns a numeric vector with the same length as `x`. When every value is
# equal, the result is 0 for each element instead of NaN from 0 / 0.
normalize <- function(x, na.rm = FALSE) {
  if (length(x) == 0) {
    return(numeric(0))
  }
  lowest <- min(x, na.rm = na.rm)
  span <- max(x, na.rm = na.rm) - lowest
  if (isTRUE(span == 0)) {
    # Constant input: avoid dividing by zero.
    return(x - lowest)
  }
  (x - lowest) / span
}

# Define function Z_normalize().
# Z-score standardization: subtracts the mean and divides by the standard
# deviation.
#   x      numeric vector.
#   na.rm  if TRUE, NA values are ignored when computing the mean and standard
#          deviation (they stay NA in the result). Default FALSE as before.
# Returns a numeric vector with the same length as `x`. When the standard
# deviation is exactly 0, the centred values (all 0) are returned instead of
# NaN from 0 / 0.
Z_normalize <- function(x, na.rm = FALSE) {
  centered <- x - mean(x, na.rm = na.rm)
  spread <- sd(x, na.rm = na.rm)
  if (isTRUE(spread == 0)) {
    # Constant input: avoid dividing by zero.
    return(centered)
  }
  centered / spread
}

# Normalize every numeric attribute, always reading the untouched values from
# dataWithoutNormalization. For each column the min-max result is stored and
# printed first, then replaced by the z-score result and printed again, so the
# z-scores are what remain in `dataset` once the loop has finished.
columns_to_normalize <- c(
  "age", "fnlwgt", "education-num",
  "hours-per-week", "capital-gain", "capital-loss"
)

for (column_name in columns_to_normalize) {
  raw_values <- dataWithoutNormalization[[column_name]]

  # Call normalize function (min-max scaling)
  dataset[[column_name]] <- normalize(raw_values)
  print(dataset)

  # Call Z_normalize function (z-score standardization)
  dataset[[column_name]] <- Z_normalize(raw_values)
  print(dataset)
}
NA
LS0tDQp0aXRsZTogInBoYXNlIDEiDQpvdXRwdXQ6IGh0bWxfbm90ZWJvb2sNCi0tLQ0KDQppbnN0YWxsaW5nIHRoZSBwYWNrYWdlcw0KYGBge3J9DQppbnN0YWxsLnBhY2thZ2VzKCJvdXRsaWVycyIpDQppbnN0YWxsLnBhY2thZ2VzKCJzY2F0dGVycGxvdDNkIikgDQppbnN0YWxsLnBhY2thZ2VzKCJkcGx5ciIpDQppbnN0YWxsLnBhY2thZ2VzKCJnZ3Bsb3QyIikNCmluc3RhbGwucGFja2FnZXMoImNvbG9yc3BhY2UiKQ0KDQpgYGANCnJlYWRpbmcgbGlicmFyaWVzIGFuZCB0aGUgZGF0YXNldA0KYGBge3J9DQpsaWJyYXJ5KGdncGxvdDIpDQpsaWJyYXJ5KG91dGxpZXJzKQ0KbGlicmFyeShzY2F0dGVycGxvdDNkKQ0KbGlicmFyeShkcGx5cikNCmxpYnJhcnkocmVhZHIpDQpkYXRhc2V0IDwtIHJlYWRfY3N2KCJzYWxhcnkuY3N2IikNClZpZXcoZGF0YXNldCkNCmBgYA0KU2FtcGxlIG9mIHJhdyBkYXRhc2V0IGFuZCBzdW1tYXJ5IA0KYGBge3J9DQpWaWV3KGRhdGFzZXQpDQpzdW1tYXJ5KGRhdGFzZXQpDQpgYGANCmVuY29kaW5nIA0KYGBge3J9DQpkYXRhc2V0JHdvcmtjbGFzcyA8LSAgYXMuaW50ZWdlcihmYWN0b3IoZGF0YXNldCR3b3JrY2xhc3MpKQ0KZGF0YXNldCRtYXJpdGFsLnN0YXR1cyA8LSAgYXMuaW50ZWdlcihmYWN0b3IoZGF0YXNldCRgbWFyaXRhbC1zdGF0dXNgKSkNCmRhdGFzZXQkb2NjdXBhdGlvbiA8LSAgYXMuaW50ZWdlcihmYWN0b3IoZGF0YXNldCRvY2N1cGF0aW9uKSkNCmRhdGFzZXQkcmVsYXRpb25zaGlwIDwtICBhcy5pbnRlZ2VyKGZhY3RvcihkYXRhc2V0JHdvcmtjbGFzcykpDQpkYXRhc2V0JHJhY2UgPC0gIGFzLmludGVnZXIoZmFjdG9yKGRhdGFzZXQkcmFjZSkpDQpkYXRhc2V0JHNleCA8LSAgYXMuaW50ZWdlcihmYWN0b3IoZGF0YXNldCRzZXgpKQ0KZGF0YXNldCRuYXRpdmUuY291bnRyeSA8LSAgYXMuaW50ZWdlcihmYWN0b3IoZGF0YXNldCRgbmF0aXZlLWNvdW50cnlgKSkNCnByaW50KGRhdGFzZXQpDQpgYGANCg0KIE1pc3NpbmcgdmFsdWVzDQpgYGB7cn0NCnN1bShpcy5uYShkYXRhc2V0KSkNCmBgYA0KIHdlIG5vdGljZWQgdGhhdCB0aGVyZSBpcyBhIHF1ZXN0aW9uIG1hcmsgaW4gc29tZSB2YWx1ZXMgYWx0aG91Z2ggd2UgY2hlY2tlZCB0aGUgbWlzc2luZyB2YWx1ZXMgaW4gcHJldmlvdXMgcGFydCBhbmQgdGhlIHJlc2F1bHQgd2FzIDAgc28gd2UgYXJlIGdvaW5nIHRvIGNsZWFuIHRoZW0gYnkgZGVsZXRpbmcgdGhlIHJvdw0KYGBge3J9DQpkYXRhc2V0IDwtIGRhdGFzZXRbIWFwcGx5KGRhdGFzZXQgPT0gIj8iLCAxLCBhbnkpLCBdDQpwcmludChkYXRhc2V0KQ0KYGBgDQpyZW1vdmluZyBvdXRsaWVycw0KYGBge3J9DQpPdXRBZ2UgPSBvdXRsaWVyKGRhdGFzZXQkYWdlLCBsb2dpY2FsID1UUlVFKQ0Kc3VtKE91dEFnZSkNCkZpbmRfb3V0bGllciA9IHdoaWNoKE91dEFnZSA9PVRSVUUsIGFyci5pbmQgPSBUUlVFKQ0KT3V0QWdlDQpGaW5kX291dGxpZXINCiMjIyMNCk91dGZubHdndCA9IG91dGxp
ZXIoZGF0YXNldCRmbmx3Z3QsIGxvZ2ljYWwgPVRSVUUpDQpzdW0oT3V0Zm5sd2d0KQ0KRmluZF9vdXRsaWVyID0gd2hpY2goT3V0Zm5sd2d0ID09VFJVRSwgYXJyLmluZCA9IFRSVUUpDQpPdXRmbmx3Z3QNCiMjIw0KT3V0ZWR1Y2F0aW9uID0gb3V0bGllcihkYXRhc2V0JGBlZHVjYXRpb24tbnVtYCwgbG9naWNhbCA9VFJVRSkNCnN1bShPdXRlZHVjYXRpb24pDQpGaW5kX291dGxpZXIgPSB3aGljaChPdXRlZHVjYXRpb24gPT1UUlVFLCBhcnIuaW5kID0gVFJVRSkNCk91dGVkdWNhdGlvbg0KIyMNCg0KT3V0aG91cnMgPSBvdXRsaWVyKGRhdGFzZXQkYGhvdXJzLXBlci13ZWVrYCwgbG9naWNhbCA9VFJVRSkNCnN1bShPdXRob3VycykNCkZpbmRfb3V0bGllciA9IHdoaWNoKE91dGhvdXJzID09VFJVRSwgYXJyLmluZCA9IFRSVUUpDQpPdXRob3Vycw0KIyMjDQpPdXRjYXBpdGFsRyA9IG91dGxpZXIoZGF0YXNldCRgY2FwaXRhbC1nYWluYCwgbG9naWNhbCA9VFJVRSkNCnN1bShPdXRjYXBpdGFsRykNCkZpbmRfb3V0bGllciA9IHdoaWNoKE91dGNhcGl0YWxHID09VFJVRSwgYXJyLmluZCA9IFRSVUUpDQpPdXRjYXBpdGFsRw0KIyMjDQpPdXRjYXBpdGFsTCA9IG91dGxpZXIoZGF0YXNldCRgY2FwaXRhbC1sb3NzYCwgbG9naWNhbCA9VFJVRSkNCnN1bShPdXRjYXBpdGFsTCkNCkZpbmRfb3V0bGllciA9IHdoaWNoKE91dGNhcGl0YWxMID09VFJVRSwgYXJyLmluZCA9IFRSVUUpDQpPdXRjYXBpdGFsTA0KDQoNCiNSZW1vdmUgb3V0bGllcg0KZGF0YXNldD0gZGF0YXNldFstRmluZF9vdXRsaWVyLF0NCg0KYGBgDQpwcmludGluZyB0aGUgZGF0YXNldCBhZnRlciBjbGVhbmluZyB0aGUgZGF0YQ0KYGBge3J9DQpwcmludChkYXRhc2V0KQ0KYGBgDQoNCkNyZWF0ZSBhIG5ldyBjb2x1bW4gY2FsbGVkIG51bV9zYWxhcnkgdG8gdHJhbnNmb3JtIHRoZSBiaW5hcnkgYXR0cmlidXRlIGludG8gbnVtcmljYWwgdG8gdXNlIGl0IGJldHRlciBhcyBpdCBpdCB0aGUgY2xhc3MgbGFiZWwNCmBgYHtyfQ0KZGF0YXNldCRudW1fc2FsYXJ5IDwtIGlmZWxzZShkYXRhc2V0JHNhbGFyeSA9PSAiPjUwSyIsIDEsIDApDQoNCmBgYA0KRGF0YSBzdW1tYXJ5DQpgYGB7cn0NCnN1bW1hcnkoZGF0YXNldCRhZ2UpDQpzdW1tYXJ5KGRhdGFzZXQkYGhvdXJzLXBlci13ZWVrYCkNCnN1bW1hcnkoZGF0YXNldCRlZHVjYXRpb24pDQpzdW1tYXJ5KGRhdGFzZXQkb2NjdXBhdGlvbikNCnN1bW1hcnkoZGF0YXNldCRzZXgpDQpzdW1tYXJ5KGRhdGFzZXQkc2FsYXJ5KQ0KYGBgDQp2YXJpYW5jZSANCmBgYHtyfQ0KdmFyKGRhdGFzZXQkYWdlKQ0KdmFyKGRhdGFzZXQkYGhvdXJzLXBlci13ZWVrYCkNCmBgYA0KRGlzY3JldGl6ZSB0aGUgaG91cnMtcGVyLXdlZWsgaW50byB0aHJlZSBiaW5zDQpgYGB7cn0NCmRhdGFzZXQkaG91cnNfcGVyX3dlZWtfYmlubmVkIDwtIGN1dChkYXRhc2V0JGBob3Vycy1wZXItd2Vla2AsIGJyZWFrcyA9IGMoMCwgMzAsIDQwLCBJbmYpLCBsYWJlbHMgPSBj
KCJMb3ciLCAiTWVkaXVtIiwgIkhpZ2giKSkNCnByaW50KGRhdGFzZXQkaG91cnNfcGVyX3dlZWtfYmlubmVkKQ0KYGBgDQpDcmVhdGUgYSBkZW5zaXR5IHBsb3QgZm9yIHRoZSBhZ2UgdmFyaWFibGUNCmBgYHtyfQ0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gYWdlKSkgKw0KICBnZW9tX2RlbnNpdHkoKQ0KYGBgDQoNCg0KaGlzdG9ncmFtcw0KYGBge3J9DQojIEhpc3RvZ3JhbSBvZiB0aGUgYWdlIHZhcmlhYmxlDQpnZ3Bsb3QoZGF0YXNldCwgYWVzKHggPSBhZ2UpKSArDQogIGdlb21faGlzdG9ncmFtKCkNCg0KIyBIaXN0b2dyYW0gb2YgdGhlIG51bV9zYWxhcnkgdmFyaWFibGUgd2hlcmUgdGhlIDEgcmVwcmVzZW50cyBzYWxhcnkgPj01MGsgYW5kIDAgcmVwcmVzZW50cyBzYWxhcnkgPDUwaw0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gbnVtX3NhbGFyeSkpICsNCiAgZ2VvbV9oaXN0b2dyYW0oKQ0KDQojIEhpc3RvZ3JhbSBvZiB0aGUgaG91cnMtcGVyLXdlZWsgdmFyaWFibGUNCmdncGxvdChkYXRhc2V0LCBhZXMoeCA9IGBob3Vycy1wZXItd2Vla2ApKSArDQogIGdlb21faGlzdG9ncmFtKCkNCg0KIyBIaXN0b2dyYW0gb2YgdGhlIGZubHdndCB2YXJpYWJsZQ0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gZm5sd2d0KSkgKw0KICBnZW9tX2hpc3RvZ3JhbSgpDQoNCmBgYA0KDQpiYXIgcGxvdHMgDQpgYGB7cn0NCiMgQmFyIHBsb3Qgb2YgdGhlIHdvcmtjbGFzcyB2YXJpYWJsZQ0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gd29ya2NsYXNzKSkgKyBnZW9tX2JhcigpDQoNCiMgQmFyIHBsb3Qgb2YgdGhlIGVkdWNhdGlvbiB2YXJpYWJsZQ0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gZWR1Y2F0aW9uKSkgKyBnZW9tX2JhcigpDQoNCiMgQmFyIHBsb3Qgb2YgdGhlIG1hcml0YWwtc3RhdHVzIHZhcmlhYmxlDQpnZ3Bsb3QoZGF0YXNldCwgYWVzKHggPSBgbWFyaXRhbC1zdGF0dXNgKSkgKyBnZW9tX2JhcigpDQoNCiMgQmFyIHBsb3Qgb2YgdGhlIG9jY3VwYXRpb24gdmFyaWFibGUNCmdncGxvdChkYXRhc2V0LCBhZXMoeCA9IG9jY3VwYXRpb24pKSArIGdlb21fYmFyKCkNCg0KIyBCYXIgcGxvdCBvZiB0aGUgcmVsYXRpb25zaGlwIHZhcmlhYmxlDQpnZ3Bsb3QoZGF0YXNldCwgYWVzKHggPSByZWxhdGlvbnNoaXApKSArIGdlb21fYmFyKCkNCg0KIyBCYXIgcGxvdCBvZiB0aGUgc2V4IHZhcmlhYmxlDQpnZ3Bsb3QoZGF0YXNldCwgYWVzKHggPSBzZXgpKSArZ2VvbV9iYXIoKQ0KDQojIEJhciBwbG90IG9mIHRoZSBuYXRpdmUtY291bnRyeSB2YXJpYWJsZQ0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gYG5hdGl2ZS1jb3VudHJ5YCkpICsgZ2VvbV9iYXIoKQ0KDQojIEJhciBwbG90IG9mIHRoZSBzYWxhcnkgdmFyaWFibGUNCmdncGxvdChkYXRhc2V0LCBhZXMoeCA9IHNhbGFyeSkpICsgZ2VvbV9iYXIoKQ0KYGBgDQoNCiBib3ggcGxvdA0KYGBge3J9DQpnZ3Bsb3QoZGF0YXNldCwgYWVzKHggPSBzYWxhcnksIHkgPSBgaG91cnMtcGVyLXdlZWtg
KSkgKw0KICBnZW9tX2JveHBsb3QoKSArDQogIGxhYnModGl0bGUgPSAiQm94IFBsb3Qgb2YgU2FsYXJ5IGFuZCBIb3VycyBwZXIgV2VlayIsIHggPSAiU2FsYXJ5IiwgeSA9ICJIb3VycyBwZXIgV2VlayIpDQoNCg0KZ2dwbG90KGRhdGFzZXQsIGFlcyh4ID0gc2FsYXJ5LCB5ID0gYWdlKSkgKw0KICBnZW9tX2JveHBsb3QoKSArDQogIGxhYnModGl0bGUgPSAiQm94IFBsb3Qgb2YgQWdlIGFuZCBTYWxhcnkiLCB4ID0gInNhbGFyeSIsIHkgPSAiYWdlIikNCmBgYA0KDQpzY2F0dGVyIHBsb3QNCmBgYHtyfQ0Kc2NhdHRlcnBsb3QzZChkYXRhc2V0JG51bV9zYWxhcnksZGF0YXNldCRhZ2UsIGRhdGFzZXQkYGhvdXJzLXBlci13ZWVrYCkNCmBgYA0KDQpwaWUgY2hhcnQgZm9yIHRoZSBzYWxhcnkgYXR0cmlidXRlDQpgYGB7cn0NCnRhYiA8LSBkYXRhc2V0JHNhbGFyeSAlPiUgdGFibGUoKQ0KcHJlY2VudGFnZXMgPC0gdGFiICU+JSBwcm9wLnRhYmxlKCkgJT4lIHJvdW5kKDMpICogMTAwIA0KdHh0IDwtIHBhc3RlMChuYW1lcyh0YWIpLCAnXG4nLCBwcmVjZW50YWdlcywgJyUnKSANCnBpZSh0YWIsIGxhYmVscz10eHQpDQpgYGANCg0KTm9ybWFsaXphdGlvbg0KYGBge3J9DQpkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24gPC0gZGF0YXNldA0KcHJpbnQoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uKQ0KI0RlZmluZSBmdW5jdGlvbsKgbm9ybWFsaXplKCkuDQpub3JtYWxpemUgPC0gZnVuY3Rpb24oeCkge3JldHVybiAoKHggLSBtaW4oeCkpIC8gKG1heCh4KSAtIG1pbih4KSkpfQ0KI0RlZmluZSBmdW5jdGlvbsKgWl9ub3JtYWxpemUoKS4NClpfbm9ybWFsaXplIDwtIGZ1bmN0aW9uKHgpIHtyZXR1cm4gKCh4IC0gbWVhbih4KSkgLyBzZCh4KSl9DQoNCiNDYWxsIG5vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGFnZTwtbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRhZ2UpDQpwcmludChkYXRhc2V0KQ0KDQojQ2FsbCBaX25vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGFnZTwtWl9ub3JtYWxpemUoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uJGFnZSkNCnByaW50KGRhdGFzZXQpDQoNCiMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjDQoNCiNDYWxsIG5vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGZubHdndDwtbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRmbmx3Z3QpDQpwcmludChkYXRhc2V0KQ0KDQojQ2FsbCBaX25vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGZubHdndDwtWl9ub3JtYWxpemUoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uJGZubHdndCkNCnByaW50KGRhdGFzZXQpDQoNCiMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjDQoNCiNDYWxsIG5vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGBlZHVjYXRpb24tbnVtYDwtbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRgZWR1Y2F0aW9uLW51bWApDQpwcmludChkYXRhc2V0
KQ0KDQojQ2FsbCBaX25vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGBlZHVjYXRpb24tbnVtYDwtWl9ub3JtYWxpemUoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uJGBlZHVjYXRpb24tbnVtYCkNCnByaW50KGRhdGFzZXQpDQoNCiMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjDQoNCg0KDQojQ2FsbCBub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRgaG91cnMtcGVyLXdlZWtgPC1ub3JtYWxpemUoZGF0YVdpdGhvdXROb3JtYWxpemF0aW9uJGBob3Vycy1wZXItd2Vla2ApDQpwcmludChkYXRhc2V0KQ0KDQojQ2FsbCBaX25vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGBob3Vycy1wZXItd2Vla2A8LVpfbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRgaG91cnMtcGVyLXdlZWtgKQ0KcHJpbnQoZGF0YXNldCkNCg0KIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMNCg0KI0NhbGwgbm9ybWFsaXplIGZ1bmNydGlvbiANCmRhdGFzZXQkYGNhcGl0YWwtZ2FpbmA8LW5vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYGNhcGl0YWwtZ2FpbmApDQpwcmludChkYXRhc2V0KQ0KDQojQ2FsbCBaX25vcm1hbGl6ZSBmdW5jcnRpb24gDQpkYXRhc2V0JGBjYXBpdGFsLWdhaW5gPC1aX25vcm1hbGl6ZShkYXRhV2l0aG91dE5vcm1hbGl6YXRpb24kYGNhcGl0YWwtZ2FpbmApDQpwcmludChkYXRhc2V0KQ0KDQojIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIyMjIw0KDQojQ2FsbCBub3JtYWxpemUgZnVuY3J0aW9uIA0KZGF0YXNldCRgY2FwaXRhbC1sb3NzYDwtbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRgY2FwaXRhbC1sb3NzYCkNCnByaW50KGRhdGFzZXQpDQoNCiNDYWxsIFpfbm9ybWFsaXplIGZ1bmNydGlvbiANCmRhdGFzZXQkYGNhcGl0YWwtbG9zc2A8LVpfbm9ybWFsaXplKGRhdGFXaXRob3V0Tm9ybWFsaXphdGlvbiRgY2FwaXRhbC1sb3NzYCkNCnByaW50KGRhdGFzZXQpDQoNCmBgYA0KDQoNCmBgYHtyfQ0KDQpgYGANCg==